# thing is useful for debugging.
dominfo.setName('migrating-' + domain_name)
- done_suspend = 0
-
try:
dominfo.migrateDevices(network, dst, DEV_MIGRATE_STEP1, domain_name)
log.debug("Suspending %d ...", dominfo.getDomid())
dominfo.shutdown('suspend')
dominfo.waitForShutdown()
- done_suspend = 1
dominfo.migrateDevices(network, dst, DEV_MIGRATE_STEP2,
domain_name)
log.info("Domain %d suspended.", dominfo.getDomid())
pass
except Exception, exn:
- log.exception("Save failed on domain %s (%s).", domain_name,
+ log.exception("Save failed on domain %s (%s) - resuming.", domain_name,
dominfo.getDomid())
-
- # If we didn't get as far as suspending the domain (for
- # example, we couldn't balloon enough memory for the new
- # domain), then we don't want to re-plumb the devices, as the
- # domU will not be expecting it.
- if done_suspend:
- log.debug("XendCheckpoint.save: resumeDomain")
- dominfo.resumeDomain()
+ dominfo.resumeDomain()
try:
dominfo.setName(domain_name)
sock.send("receive\n")
sock.recv(80)
- XendCheckpoint.save(sock.fileno(), dominfo, True, live, dst, node=node)
- sock.close()
+ try:
+ XendCheckpoint.save(sock.fileno(), dominfo, True, live, dst, node=node)
+ finally:
+ sock.close()
def domain_save(self, domid, dst, checkpoint=False):
"""Start saving a domain to file.
def resumeDomain(self):
log.debug("XendDomainInfo.resumeDomain(%s)", str(self.domid))
- if self.domid is None:
+ # resume a suspended domain (e.g. after live checkpoint, or after
+ # a later error during save or migrate); checks that the domain
+ # is currently suspended first, so it is safe to call from anywhere
+
+ xeninfo = dom_get(self.domid)
+ if xeninfo is None:
+ return
+ if not xeninfo['shutdown']:
return
+ reason = shutdown_reason(xeninfo['shutdown_reason'])
+ if reason != 'suspend':
+ return
+
try:
# could also fetch a parsed note from xenstore
fast = self.info.get_notes().get('SUSPEND_CANCEL') and 1 or 0